/** 
 * File-Name:IParser.java
 *
 * Created on 2010-11-21 07:59:52 PM
 * 
 * @author: Neo (neolimeng@gmail.com)
 * Software Engineering Institute, Peking University, China
 * 
 * Copyright (c) 2009, Peking University
 * 
 *
 */
package org.neocrawler.parser;

import java.util.List;

import org.neocrawler.entity.WebContent;

/**
 * Contract that every parser has to implement: it provides the initial
 * seeds and parses crawled web pages into new {@code WebContent} items.
 *
 * @author Neo (neolimeng@gmail.com), Software Engineering Institute, Peking
 *         University, China
 * @version 1.0 2010-11-21 07:59:52 PM
 */
public interface IParser {

	/**
	 * Type tag whose value is {@code "SEEDS"}.
	 * NOTE(review): presumably marks seed entries; its consumers are not
	 * visible in this file - confirm against the callers.
	 */
	String TYPE_SEED = "SEEDS";

	/**
	 * Gets the initial seeds.
	 *
	 * @return the initial seeds, as a list of {@code WebContent}
	 */
	List<WebContent> getInitialSeeds();

	/**
	 * Parses a newly crawled web page and generates new {@code WebContent}
	 * items from it.
	 *
	 * @param webContent
	 *            the {@code WebContent} passed along with the page
	 *            (presumably the entry the page was crawled for - TODO
	 *            confirm)
	 * @param webPage
	 *            the crawled web page as a string (presumably its raw
	 *            text/markup - TODO confirm)
	 * @return the newly generated {@code WebContent} items
	 */
	List<WebContent> parse(WebContent webContent, String webPage);
}
